{"nbformat":4,"nbformat_minor":0,"metadata":{"colab":{"provenance":[{"file_id":"1yZcAvzPRSAOGBxYDVgtDywAJgZmGD8AG","timestamp":1689538072188},{"file_id":"1wyzuYfVsl5mPnzGzJGqKODItBOK8Nj46","timestamp":1689536289631}],"machine_shape":"hm","gpuType":"A100","authorship_tag":"ABX9TyPqYV7Y8H9Wv0OoqgIE+vi1"},"kernelspec":{"name":"python3","display_name":"Python 3"},"language_info":{"name":"python"},"widgets":{"application/vnd.jupyter.widget-state+json":{"fa0e7bbe536e472e9991d863b102f15a":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_01c27f695e3b470fba5238e264e4ad07","IPY_MODEL_20762690419a448eaf47b1cb70530055","IPY_MODEL_7d512d43a0e64302ac129fe66cba6ee1"],"layout":"IPY_MODEL_8731d4e7053c490c8a9c5c6860a4e8fb"}},"01c27f695e3b470fba5238e264e4ad07":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_7bffbeb0ad304836b96f54e02285aaee","placeholder":"​","style":"IPY_MODEL_ad874c3f37f246d2a8005a93bc4a85b6","value":"Downloading (…)okenizer_config.json: 
100%"}},"20762690419a448eaf47b1cb70530055":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_6ef83f585f3f4f68bc659040a4bea134","max":270,"min":0,"orientation":"horizontal","style":"IPY_MODEL_fbe3297c1ca64ccc85a5326a93e40259","value":270}},"7d512d43a0e64302ac129fe66cba6ee1":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_edf64acf2d614d018e9f4a16261c4adc","placeholder":"​","style":"IPY_MODEL_a8b86a8c5a75478d92cc8a071bc74bbe","value":" 270/270 [00:00&lt;00:00, 
22.4kB/s]"}},"8731d4e7053c490c8a9c5c6860a4e8fb":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"7bffbeb0ad304836b96f54e02285aaee":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"ad874c3f37f246d2a8005a93bc4a85b6":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"6ef83f585f3f4f68bc659040a4bea134":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"fbe3297c1ca64ccc85a5326a93e40259":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"edf64acf2d614d018e9f4a16261c4adc":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"a8b86a8c5a75478d92cc8a071bc74bbe":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"3bbe895893e148f9896676a31a88f3fc":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_09f9d26f420f4dec84ba34f11b80b73f","IPY_MODEL_7c4799db0f364ac5baa8a7987b44149a","IPY_MODEL_be1640e664c44df7b6fd0549fb12a4c3"],"layout":"IPY_MODEL_355ab8d20c0f43b4bda4ed533a4edcd3"
}},"09f9d26f420f4dec84ba34f11b80b73f":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_57f36ed86b6c4809971337eaa8d964a3","placeholder":"​","style":"IPY_MODEL_eac29d2974604951ba63f8e65675172e","value":"Downloading (…)lve/main/config.json: 100%"}},"7c4799db0f364ac5baa8a7987b44149a":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_ed19c56b20ba4cc088e85a25bf1d1e4e","max":570,"min":0,"orientation":"horizontal","style":"IPY_MODEL_5ab8f35107cd49df9e2fe7d17ccc0a42","value":570}},"be1640e664c44df7b6fd0549fb12a4c3":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_a1616fad62924db78e443a8b93047265","placeholder":"​","style":"IPY_MODEL_5510ec05edc14e43a994498161bae651","value":" 570/570 [00:00&lt;00:00, 
49.1kB/s]"}},"355ab8d20c0f43b4bda4ed533a4edcd3":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"57f36ed86b6c4809971337eaa8d964a3":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"eac29d2974604951ba63f8e65675172e":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"ed19c56b20ba4cc088e85a25bf1d1e4e":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"5ab8f35107cd49df9e2fe7d17ccc0a42":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"a1616fad62924db78e443a8b93047265":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"5510ec05edc14e43a994498161bae651":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"ec32948c16b3443d8db3bf12a098c15a":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_5abe34cfd1df41d093a1c1d4b62388a6","IPY_MODEL_e41f1757c1d9492da1d9c8f6e80d4874","IPY_MODEL_b143d106dda74054bf568f5490099766"],"layout":"IPY_MODEL_f21140dc2d85407ea2a487b93aacbc5b"
}},"5abe34cfd1df41d093a1c1d4b62388a6":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_7062c6b8509543bc97d15efb009b98e2","placeholder":"​","style":"IPY_MODEL_cf3493e5beb2455a9e2c92e670ab7c06","value":"Downloading (…)solve/main/vocab.txt: 100%"}},"e41f1757c1d9492da1d9c8f6e80d4874":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_5dfd63859f784b09b0ab43fe51b616b0","max":223843,"min":0,"orientation":"horizontal","style":"IPY_MODEL_28fd7936d80a49fa811210d21baeaf75","value":223843}},"b143d106dda74054bf568f5490099766":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_b4eeb0aca28d41dd813f389b654b88b8","placeholder":"​","style":"IPY_MODEL_5b7c1ed7646d4bd0bca9005d3000fd4b","value":" 224k/224k [00:00&lt;00:00, 
525kB/s]"}},"f21140dc2d85407ea2a487b93aacbc5b":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"7062c6b8509543bc97d15efb009b98e2":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"o
verflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"cf3493e5beb2455a9e2c92e670ab7c06":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"5dfd63859f784b09b0ab43fe51b616b0":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"28fd7936d80a49fa811210d21baeaf75":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"b4eeb0aca28d41dd813f389b654b88b8":{"model_mo
dule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"5b7c1ed7646d4bd0bca9005d3000fd4b":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"618482e958f74bac8e637341c5ebc441":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_cf10d626a08647dcaf12bb0d2425277c","IPY_MODEL_5ca5da6e43e24c0a98053c8201b1fe7d","IPY_MODEL_5e829560c52849e187db0ed094acdf0a"],"layout":"IPY_MODEL_1a7842e0efa24abeba6e1675583b8dd7"}
},"cf10d626a08647dcaf12bb0d2425277c":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_adc12fc45aaf48c6bcb24c8238abf300","placeholder":"​","style":"IPY_MODEL_a19c0cf31c3c4aeeb336c28cfc6762bb","value":"Downloading (…)/main/tokenizer.json: 100%"}},"5ca5da6e43e24c0a98053c8201b1fe7d":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_f8e885cca8144136a341edb9dcf53f95","max":454226,"min":0,"orientation":"horizontal","style":"IPY_MODEL_b526ff073a844b259458d5abc24665d4","value":454226}},"5e829560c52849e187db0ed094acdf0a":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_d7e3906709ef4ef1a6d20d5edb9c5bd3","placeholder":"​","style":"IPY_MODEL_07b2452e6b3c406581d8405ed29dbfc2","value":" 454k/454k [00:00&lt;00:00, 
1.06MB/s]"}},"1a7842e0efa24abeba6e1675583b8dd7":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"adc12fc45aaf48c6bcb24c8238abf300":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"a19c0cf31c3c4aeeb336c28cfc6762bb":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"f8e885cca8144136a341edb9dcf53f95":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"b526ff073a844b259458d5abc24665d4":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"d7e3906709ef4ef1a6d20d5edb9c5bd3":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"07b2452e6b3c406581d8405ed29dbfc2":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"a0a5467f1be14cf9b271995c8467d98c":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_90f480c849604618802a970439c004a3","IPY_MODEL_c8694078b30c46af824862c6d5604e26","IPY_MODEL_6eecdb3ddbca44e889995bba4143083a"],"layout":"IPY_MODEL_d115a88dc64248c990319b2b2a95367a"
}},"90f480c849604618802a970439c004a3":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_264e8dd132844f55b69841415a8b819d","placeholder":"​","style":"IPY_MODEL_94e0cb53a5324b17965b40f76ddf5f48","value":"Downloading (…)cial_tokens_map.json: 100%"}},"c8694078b30c46af824862c6d5604e26":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_680058a58f0747e58ccee1c3f59b5d43","max":112,"min":0,"orientation":"horizontal","style":"IPY_MODEL_5c23b40e9f2d4797840683184078a693","value":112}},"6eecdb3ddbca44e889995bba4143083a":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_5c9ae4a0298c44ab881a5fac1e6be3e7","placeholder":"​","style":"IPY_MODEL_99eb5ff7212b4bf9ada29956e7327fcd","value":" 112/112 [00:00&lt;00:00, 
9.06kB/s]"}},"d115a88dc64248c990319b2b2a95367a":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"264e8dd132844f55b69841415a8b819d":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"94e0cb53a5324b17965b40f76ddf5f48":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"680058a58f0747e58ccee1c3f59b5d43":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"5c23b40e9f2d4797840683184078a693":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"5c9ae4a0298c44ab881a5fac1e6be3e7":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"99eb5ff7212b4bf9ada29956e7327fcd":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"ea15658f530a40a0a3ee74d76c415b95":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_3d7d2ab0105d446db11421900ff92908","IPY_MODEL_aa6b7143dbda4165805f21e9b47119d0","IPY_MODEL_c9db5f9857414a518e58127bbf331d58"],"layout":"IPY_MODEL_717c53fc2a8c47e6a85428b6c2f13b0d"
}},"3d7d2ab0105d446db11421900ff92908":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_836a82a00fee45c5bdb807b632a6fd18","placeholder":"​","style":"IPY_MODEL_949b5d5e19ac4058a6c3aae95f147d0f","value":"Map:  99%"}},"aa6b7143dbda4165805f21e9b47119d0":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"","description":"","description_tooltip":null,"layout":"IPY_MODEL_868c8bb1089f45d9b49817017ad1fa39","max":21924,"min":0,"orientation":"horizontal","style":"IPY_MODEL_73b7d4338ce241fca51d26baf1a7c94c","value":21924}},"c9db5f9857414a518e58127bbf331d58":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_ae28dc20466446b6ba1fae25ab31e22b","placeholder":"​","style":"IPY_MODEL_f224a49d51d3485d9173ad23ee7a8fa3","value":" 21799/21924 [00:13&lt;00:00, 1822.69 
examples/s]"}},"717c53fc2a8c47e6a85428b6c2f13b0d":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":"hidden","width":null}},"836a82a00fee45c5bdb807b632a6fd18":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":
null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"949b5d5e19ac4058a6c3aae95f147d0f":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"868c8bb1089f45d9b49817017ad1fa39":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"73b7d4338ce241fca51d26baf1a7c94c":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"ae28dc20466446b6ba1fae25ab31e22b":{"m
odel_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"f224a49d51d3485d9173ad23ee7a8fa3":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"b6930f727faf4af5ac6103f34a0728a3":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_7e4d704ccfbb413aac17080649470991","IPY_MODEL_a950da66aac144b2a2e98d7861b63fa1","IPY_MODEL_689c1e20ba9342dca8a7a8806fdcae8f"],"layout":"IPY_MODEL_19898c6fdb57427a80263af18f7
62c22"}},"7e4d704ccfbb413aac17080649470991":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_4dab1258e1b44bc99d2714b00b89aa2f","placeholder":"​","style":"IPY_MODEL_5138c07602404491adbd286a0ac19bb6","value":"Map: 100%"}},"a950da66aac144b2a2e98d7861b63fa1":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"","description":"","description_tooltip":null,"layout":"IPY_MODEL_97133fcbd22e4f6d835ad29b8517a3d0","max":648,"min":0,"orientation":"horizontal","style":"IPY_MODEL_adeb4ca8368c4f64a451ba708c8614f2","value":648}},"689c1e20ba9342dca8a7a8806fdcae8f":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_df8e65d254d44e1cb4147514915fbb30","placeholder":"​","style":"IPY_MODEL_5df370321ba244e0b778790e8a2d9a10","value":" 648/648 [00:00&lt;00:00, 804.21 
examples/s]"}},"19898c6fdb57427a80263af18f762c22":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":"hidden","width":null}},"4dab1258e1b44bc99d2714b00b89aa2f":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":
null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"5138c07602404491adbd286a0ac19bb6":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"97133fcbd22e4f6d835ad29b8517a3d0":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"adeb4ca8368c4f64a451ba708c8614f2":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"df8e65d254d44e1cb4147514915fbb30":{"m
odel_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"5df370321ba244e0b778790e8a2d9a10":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"ac678daee17c4572a15387f65cf3a2e6":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_5263dc3f385a450eb304e909dd53d37e","IPY_MODEL_1acac7477f36498a8763ce3aca41975e","IPY_MODEL_6bfeb527c31c4741945917d4243246cc"],"layout":"IPY_MODEL_fa6fd522a99e46e0a10ca64f4aa
6d6cb"}},"5263dc3f385a450eb304e909dd53d37e":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_e171724c11814192bf84273c89402b34","placeholder":"​","style":"IPY_MODEL_64e6581e50e84e8685e5a4db09c5cbfd","value":"Map:  97%"}},"1acac7477f36498a8763ce3aca41975e":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"","description":"","description_tooltip":null,"layout":"IPY_MODEL_e1a3c9180cab45a489a2d17a34b0eb5c","max":1296,"min":0,"orientation":"horizontal","style":"IPY_MODEL_0a22ab96872644c09c079521ff278772","value":1296}},"6bfeb527c31c4741945917d4243246cc":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_7568c3a49c0b4d349e36348c72dd1d10","placeholder":"​","style":"IPY_MODEL_00a4100953824e36a5a74585539d4aba","value":" 1260/1296 [00:01&lt;00:00, 803.56 
examples/s]"}},"fa6fd522a99e46e0a10ca64f4aa6d6cb":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":"hidden","width":null}},"e171724c11814192bf84273c89402b34":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":
null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"64e6581e50e84e8685e5a4db09c5cbfd":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"e1a3c9180cab45a489a2d17a34b0eb5c":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"0a22ab96872644c09c079521ff278772":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"7568c3a49c0b4d349e36348c72dd1d10":{"m
odel_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"00a4100953824e36a5a74585539d4aba":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"3d4245e6a02745e49da814c0d21d50f0":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_0cb68ca00dd343dd9488f0ef41ac9177","IPY_MODEL_4753e3cf5f114096a7a2acde48b117ea","IPY_MODEL_3ea79cb1ee8646019cce3e161c0d57b1"],"layout":"IPY_MODEL_b9524ffbcb6c449cba0ed72640b
fb8e1"}},"0cb68ca00dd343dd9488f0ef41ac9177":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_45343b2d50c846d09329377d993eec4e","placeholder":"​","style":"IPY_MODEL_5896c18516fe46f6bab83d226cfa2fee","value":"Downloading pytorch_model.bin: 100%"}},"4753e3cf5f114096a7a2acde48b117ea":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_6a3f4f35966444cda8a127373bbec506","max":436541650,"min":0,"orientation":"horizontal","style":"IPY_MODEL_b86e8c343bd24eee83256ed92f91561d","value":436541650}},"3ea79cb1ee8646019cce3e161c0d57b1":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_0396ab496b2b4819aaa6b4e5a8f85078","placeholder":"​","style":"IPY_MODEL_62ab062e6d424c45aca01945e179070c","value":" 437M/437M [00:26&lt;00:00, 
15.1MB/s]"}},"b9524ffbcb6c449cba0ed72640bfb8e1":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"45343b2d50c846d09329377d993eec4e":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"5896c18516fe46f6bab83d226cfa2fee":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"6a3f4f35966444cda8a127373bbec506":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"b86e8c343bd24eee83256ed92f91561d":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"0396ab496b2b4819aaa6b4e5a8f85078":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"62ab062e6d424c45aca01945e179070c":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"9a905030128747dda71e544a218f83c1":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_2cff427ff3ef4e6982d2dfbd9232d0c3","IPY_MODEL_a3f94b85301b491886a9f83b16aeac63","IPY_MODEL_4a8472d9c15443039b3053e96a6a6d41"],"layout":"IPY_MODEL_8e459af962f14b41bf8c992c5f3ab411"
}},"2cff427ff3ef4e6982d2dfbd9232d0c3":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_4deb011fc31e44b88c800d91e5f6a93d","placeholder":"​","style":"IPY_MODEL_e5da6ee403d040cbb2faba0a8bd81d22","value":"Map:  99%"}},"a3f94b85301b491886a9f83b16aeac63":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"","description":"","description_tooltip":null,"layout":"IPY_MODEL_a79e7053b6aa438bbfc03539a5ce95af","max":23868,"min":0,"orientation":"horizontal","style":"IPY_MODEL_320e848473244e59aef9b1e400b09f1b","value":23868}},"4a8472d9c15443039b3053e96a6a6d41":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_a13768a4c8894e2d88ea4ec1afd46bd2","placeholder":"​","style":"IPY_MODEL_f556bf7e32ba407199f139746e5415ff","value":" 23681/23868 [00:19&lt;00:00, 1515.99 
examples/s]"}},"8e459af962f14b41bf8c992c5f3ab411":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":"hidden","width":null}},"4deb011fc31e44b88c800d91e5f6a93d":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":
null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"e5da6ee403d040cbb2faba0a8bd81d22":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"a79e7053b6aa438bbfc03539a5ce95af":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"320e848473244e59aef9b1e400b09f1b":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"a13768a4c8894e2d88ea4ec1afd46bd2":{"m
odel_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"f556bf7e32ba407199f139746e5415ff":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}}}},"accelerator":"GPU"},"cells":[{"cell_type":"code","execution_count":1,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"scKll44AuD1v","executionInfo":{"status":"ok","timestamp":1689538324504,"user_tz":420,"elapsed":20684,"user":{"displayName":"Yu Wang","userId":"02802289530208391889"}},"outputId":"c7c5f27d-2269-4bdd-c386-5e33d56eff9c"},"outputs":[{"output_type":"stream","name":"stdout","text":["Collecting transformers==4.28.0\n","  Downloading transformers-4.28.0-py3-none-any.whl (7.0 MB)\n","\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m 
\u001b[32m7.0/7.0 MB\u001b[0m \u001b[31m54.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from transformers==4.28.0) (3.12.2)\n","Collecting huggingface-hub<1.0,>=0.11.0 (from transformers==4.28.0)\n","  Downloading huggingface_hub-0.16.4-py3-none-any.whl (268 kB)\n","\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m268.8/268.8 kB\u001b[0m \u001b[31m38.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from transformers==4.28.0) (1.22.4)\n","Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from transformers==4.28.0) (23.1)\n","Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.10/dist-packages (from transformers==4.28.0) (6.0)\n","Requirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.10/dist-packages (from transformers==4.28.0) (2022.10.31)\n","Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from transformers==4.28.0) (2.27.1)\n","Collecting tokenizers!=0.11.3,<0.14,>=0.11.1 (from transformers==4.28.0)\n","  Downloading tokenizers-0.13.3-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (7.8 MB)\n","\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m7.8/7.8 MB\u001b[0m \u001b[31m48.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: tqdm>=4.27 in /usr/local/lib/python3.10/dist-packages (from transformers==4.28.0) (4.65.0)\n","Requirement already satisfied: fsspec in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.11.0->transformers==4.28.0) (2023.6.0)\n","Requirement already satisfied: typing-extensions>=3.7.4.3 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.11.0->transformers==4.28.0) 
(4.7.1)\n","Requirement already satisfied: urllib3<1.27,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests->transformers==4.28.0) (1.26.16)\n","Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests->transformers==4.28.0) (2023.5.7)\n","Requirement already satisfied: charset-normalizer~=2.0.0 in /usr/local/lib/python3.10/dist-packages (from requests->transformers==4.28.0) (2.0.12)\n","Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests->transformers==4.28.0) (3.4)\n","Installing collected packages: tokenizers, huggingface-hub, transformers\n","Successfully installed huggingface-hub-0.16.4 tokenizers-0.13.3 transformers-4.28.0\n","Collecting datasets\n","  Downloading datasets-2.13.1-py3-none-any.whl (486 kB)\n","\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m486.2/486.2 kB\u001b[0m \u001b[31m32.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from datasets) (1.22.4)\n","Requirement already satisfied: pyarrow>=8.0.0 in /usr/local/lib/python3.10/dist-packages (from datasets) (9.0.0)\n","Collecting dill<0.3.7,>=0.3.0 (from datasets)\n","  Downloading dill-0.3.6-py3-none-any.whl (110 kB)\n","\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m110.5/110.5 kB\u001b[0m \u001b[31m18.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: pandas in /usr/local/lib/python3.10/dist-packages (from datasets) (1.5.3)\n","Requirement already satisfied: requests>=2.19.0 in /usr/local/lib/python3.10/dist-packages (from datasets) (2.27.1)\n","Requirement already satisfied: tqdm>=4.62.1 in /usr/local/lib/python3.10/dist-packages (from datasets) (4.65.0)\n","Collecting xxhash (from datasets)\n","  Downloading 
xxhash-3.2.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (212 kB)\n","\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m212.5/212.5 kB\u001b[0m \u001b[31m29.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting multiprocess (from datasets)\n","  Downloading multiprocess-0.70.14-py310-none-any.whl (134 kB)\n","\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m134.3/134.3 kB\u001b[0m \u001b[31m22.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: fsspec[http]>=2021.11.1 in /usr/local/lib/python3.10/dist-packages (from datasets) (2023.6.0)\n","Requirement already satisfied: aiohttp in /usr/local/lib/python3.10/dist-packages (from datasets) (3.8.4)\n","Requirement already satisfied: huggingface-hub<1.0.0,>=0.11.0 in /usr/local/lib/python3.10/dist-packages (from datasets) (0.16.4)\n","Requirement already satisfied: packaging in /usr/local/lib/python3.10/dist-packages (from datasets) (23.1)\n","Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.10/dist-packages (from datasets) (6.0)\n","Requirement already satisfied: attrs>=17.3.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (23.1.0)\n","Requirement already satisfied: charset-normalizer<4.0,>=2.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (2.0.12)\n","Requirement already satisfied: multidict<7.0,>=4.5 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (6.0.4)\n","Requirement already satisfied: async-timeout<5.0,>=4.0.0a3 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (4.0.2)\n","Requirement already satisfied: yarl<2.0,>=1.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (1.9.2)\n","Requirement already satisfied: frozenlist>=1.1.1 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (1.3.3)\n","Requirement already satisfied: aiosignal>=1.1.2 in 
/usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (1.3.1)\n","Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0.0,>=0.11.0->datasets) (3.12.2)\n","Requirement already satisfied: typing-extensions>=3.7.4.3 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0.0,>=0.11.0->datasets) (4.7.1)\n","Requirement already satisfied: urllib3<1.27,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests>=2.19.0->datasets) (1.26.16)\n","Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests>=2.19.0->datasets) (2023.5.7)\n","Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests>=2.19.0->datasets) (3.4)\n","Requirement already satisfied: python-dateutil>=2.8.1 in /usr/local/lib/python3.10/dist-packages (from pandas->datasets) (2.8.2)\n","Requirement already satisfied: pytz>=2020.1 in /usr/local/lib/python3.10/dist-packages (from pandas->datasets) (2022.7.1)\n","Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.10/dist-packages (from python-dateutil>=2.8.1->pandas->datasets) (1.16.0)\n","Installing collected packages: xxhash, dill, multiprocess, datasets\n","Successfully installed datasets-2.13.1 dill-0.3.6 multiprocess-0.70.14 xxhash-3.2.0\n","Collecting accelerate\n","  Downloading accelerate-0.21.0-py3-none-any.whl (244 kB)\n","\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m244.2/244.2 kB\u001b[0m \u001b[31m19.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from accelerate) (1.22.4)\n","Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from accelerate) (23.1)\n","Requirement already satisfied: psutil in /usr/local/lib/python3.10/dist-packages (from accelerate) (5.9.5)\n","Requirement already 
satisfied: pyyaml in /usr/local/lib/python3.10/dist-packages (from accelerate) (6.0)\n","Requirement already satisfied: torch>=1.10.0 in /usr/local/lib/python3.10/dist-packages (from accelerate) (2.0.1+cu118)\n","Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from torch>=1.10.0->accelerate) (3.12.2)\n","Requirement already satisfied: typing-extensions in /usr/local/lib/python3.10/dist-packages (from torch>=1.10.0->accelerate) (4.7.1)\n","Requirement already satisfied: sympy in /usr/local/lib/python3.10/dist-packages (from torch>=1.10.0->accelerate) (1.11.1)\n","Requirement already satisfied: networkx in /usr/local/lib/python3.10/dist-packages (from torch>=1.10.0->accelerate) (3.1)\n","Requirement already satisfied: jinja2 in /usr/local/lib/python3.10/dist-packages (from torch>=1.10.0->accelerate) (3.1.2)\n","Requirement already satisfied: triton==2.0.0 in /usr/local/lib/python3.10/dist-packages (from torch>=1.10.0->accelerate) (2.0.0)\n","Requirement already satisfied: cmake in /usr/local/lib/python3.10/dist-packages (from triton==2.0.0->torch>=1.10.0->accelerate) (3.25.2)\n","Requirement already satisfied: lit in /usr/local/lib/python3.10/dist-packages (from triton==2.0.0->torch>=1.10.0->accelerate) (16.0.6)\n","Requirement already satisfied: MarkupSafe>=2.0 in /usr/local/lib/python3.10/dist-packages (from jinja2->torch>=1.10.0->accelerate) (2.1.3)\n","Requirement already satisfied: mpmath>=0.19 in /usr/local/lib/python3.10/dist-packages (from sympy->torch>=1.10.0->accelerate) (1.3.0)\n","Installing collected packages: accelerate\n","Successfully installed accelerate-0.21.0\n"]}],"source":["!pip install transformers==4.28.0\n","!pip install datasets\n","!pip install accelerate -U"]},{"cell_type":"code","source":["!gdown 1a1v06PvGaWmTCWvL33o2C133D90SRzMC # download cw_texts_clean_bert.csv\n","!mkdir output\n","!mkdir /data\n","!mv cw_texts_clean_bert.csv 
/data"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"QvRTCsEPvVCY","executionInfo":{"status":"ok","timestamp":1689538330960,"user_tz":420,"elapsed":6462,"user":{"displayName":"Yu Wang","userId":"02802289530208391889"}},"outputId":"2131db9f-1662-4c97-888f-2bc9d28e5625"},"execution_count":2,"outputs":[{"output_type":"stream","name":"stdout","text":["Downloading...\n","From: https://drive.google.com/uc?id=1a1v06PvGaWmTCWvL33o2C133D90SRzMC\n","To: /content/cw_texts_clean_bert.csv\n","100% 59.5M/59.5M [00:01<00:00, 52.4MB/s]\n"]}]},{"cell_type":"code","source":["# the following lines (177 in total) are directly copied from Haffner et al. (2023), Political Analysis\n","import pandas as pd\n","from sklearn.model_selection import train_test_split\n","from datasets import Dataset\n","from transformers import AutoTokenizer, AutoModelForSequenceClassification\n","from sklearn.metrics import mean_absolute_error\n","from transformers import TrainingArguments, Trainer\n","import torch\n","import matplotlib.pyplot as plt\n","from sklearn.metrics import mean_squared_error\n","from sklearn.metrics import r2_score\n","from numpy.random import seed\n","from tqdm import tqdm\n","seed(1)\n","\n","final = pd.read_csv('/data/cw_texts_clean_bert.csv')\n","\n","print(len(final))\n","final['fatalities_log'] = final['fatalities_log'].astype(float)\n","\n","train = final[final['year'] < 2021]\n","train.reset_index(inplace=True, drop=True)\n","test = final[final['year'] == 2021]\n","test.reset_index(inplace=True, drop=True)\n","\n","train['split_dummy'] = ''\n","train['year'] = train['year'].astype(int)\n","train['month'] = train['month'].astype(int)\n","\n","for i in tqdm(range(len(train))):\n","    if train['year'][i] == 2020 and train['month'][i] > 6:\n","        train['split_dummy'][i] = 1\n","    else:\n","        train['split_dummy'][i] = 0\n","\n","train['split_dummy'].value_counts()\n","\n","train1 = train[train['split_dummy'] == 0]\n","vali = 
train[train['split_dummy'] == 1]\n","\n","X_train = train1['final_text']\n","y_train = train1['fatalities_log']\n","X_vali = vali['final_text']\n","y_vali = vali['fatalities_log']\n","X_test = test['final_text']\n","y_test = test['fatalities_log']\n","X_train = pd.DataFrame(X_train)\n","X_test = pd.DataFrame(X_test)\n","X_vali = pd.DataFrame(X_vali)\n","y_vali = pd.DataFrame(y_vali)\n","y_train = pd.DataFrame(y_train)\n","y_test = pd.DataFrame(y_test)\n","\n","df_train = pd.concat([X_train, y_train], axis=1)\n","df_val = pd.concat([X_vali, y_vali], axis=1)\n","df_test = pd.concat([X_test, y_test], axis=1)\n","\n","\n","raw_train_ds = Dataset.from_pandas(df_train)\n","raw_val_ds = Dataset.from_pandas(df_val)\n","raw_test_ds = Dataset.from_pandas(df_test)\n","\n","BASE_MODEL = \"snowood1/ConfliBERT-scr-uncased\"\n","LEARNING_RATE = 2e-5 # decreased from 2e-3\n","MAX_LENGTH = 256\n","BATCH_SIZE = 16\n","EPOCHS = 20\n","\n","tokenizer = AutoTokenizer.from_pretrained(BASE_MODEL)\n","def model_init():\n","    model = AutoModelForSequenceClassification.from_pretrained(BASE_MODEL, num_labels=1, ignore_mismatched_sizes=True)\n","    # for param in model.bert.parameters():\n","    #     param.requires_grad = False\n","    return model\n","\n","\n","ds = {\"train\": raw_train_ds, \"validation\": raw_val_ds, \"test\": raw_test_ds}\n","\n","\n","def preprocess_function(examples):\n","    label = examples[\"fatalities_log\"]\n","    examples = tokenizer(examples[\"final_text\"], truncation=True, padding=\"max_length\", max_length=256)\n","\n","    # Change this to real number\n","    examples[\"label\"] = float(label)\n","    return examples\n","\n","\n","for split in ds:\n","    ds[split] = ds[split].map(preprocess_function)\n","\n","\n","def compute_metrics_for_regression(eval_pred):\n","    logits, labels = eval_pred\n","    labels = labels.reshape(-1, 1)\n","\n","    mse = mean_squared_error(labels, logits)\n","    mae = mean_absolute_error(labels, logits)\n","    r2 = 
r2_score(labels, logits)\n","    single_squared_errors = ((logits - labels).flatten() ** 2).tolist()\n","\n","    # Compute accuracy\n","    # Based on the fact that the rounded score = true score only if |error| < 0.5, i.e. squared error < 0.25\n","    accuracy = sum([1 for e in single_squared_errors if e < 0.25]) / len(single_squared_errors)\n","\n","    return {\"mse\": mse, \"mae\": mae, \"r2\": r2, \"accuracy\": accuracy}\n","\n","training_args = TrainingArguments(\n","    output_dir=\"/data/output/conflibert\",\n","    learning_rate=LEARNING_RATE,\n","    per_device_train_batch_size=BATCH_SIZE,\n","    per_device_eval_batch_size=BATCH_SIZE,\n","    num_train_epochs=EPOCHS,\n","    evaluation_strategy=\"steps\",\n","    eval_steps=500,\n","    save_total_limit=10,\n","    load_best_model_at_end=True,\n","    weight_decay=0.01,\n","    seed=123\n",")\n","\n","class RegressionTrainer(Trainer):\n","    def compute_loss(self, model, inputs, return_outputs=False):\n","        labels = inputs.pop(\"labels\")\n","        outputs = model(**inputs)\n","        logits = outputs[0][:, 0]\n","        loss = torch.nn.functional.mse_loss(logits, labels)\n","        return (loss, outputs) if return_outputs else loss\n","\n","\n","trainer = RegressionTrainer(\n","    model_init=model_init,\n","    args=training_args,\n","    train_dataset=ds[\"train\"],\n","    eval_dataset=ds[\"validation\"],\n","    compute_metrics=compute_metrics_for_regression,\n",")\n","\n","trainer.train()\n","\n","for obj in trainer.state.log_history:\n","    print(obj)\n","\n","trainer.eval_dataset=ds[\"test\"]\n","trainer.evaluate()\n","\n","raw_pred_test, _, _ = trainer.predict(ds[\"test\"])\n","print(raw_pred_test[:20])\n","pd.DataFrame(raw_pred_test).to_csv('/data/cw_pred_test_zero.csv')\n","\n","df_results = pd.DataFrame(columns=['Test_MSE','Test_R2'], index=range(0,1))\n","mse = mean_squared_error(ds['test']['fatalities_log'], raw_pred_test)\n","r_squared = r2_score(ds['test']['fatalities_log'], 
raw_pred_test)\n","print(mse)\n","print(r_squared)\n","df_results['Test_MSE'][0] = mse\n","df_results['Test_R2'][0] = r_squared\n","df_results.to_csv('/data/bert_metrics.csv', index=False)\n","\n","## Whole CW\n","print('Now whole corpus')\n","raw_train1_ds = Dataset.from_pandas(final)\n","ds = {\"test\": raw_train1_ds}\n","\n","## Create dataset\n","\n","for split in ds:\n","    ds[split] = ds[split].map(preprocess_function)\n","\n","print('Now predicting')\n","raw_pred, _, _ = trainer.predict(ds[\"test\"])\n","print(raw_pred[:20])\n","pd.DataFrame(raw_pred).to_csv('/data/cw_bert_pred_zero.csv')\n","\n","print('DF saved')\n","\n","trainer.eval_dataset=ds[\"test\"]\n","trainer.evaluate()"],"metadata":{"colab":{"base_uri":"https://localhost:8080/","height":1000,"referenced_widgets":["fa0e7bbe536e472e9991d863b102f15a","01c27f695e3b470fba5238e264e4ad07","20762690419a448eaf47b1cb70530055","7d512d43a0e64302ac129fe66cba6ee1","8731d4e7053c490c8a9c5c6860a4e8fb","7bffbeb0ad304836b96f54e02285aaee","ad874c3f37f246d2a8005a93bc4a85b6","6ef83f585f3f4f68bc659040a4bea134","fbe3297c1ca64ccc85a5326a93e40259","edf64acf2d614d018e9f4a16261c4adc","a8b86a8c5a75478d92cc8a071bc74bbe","3bbe895893e148f9896676a31a88f3fc","09f9d26f420f4dec84ba34f11b80b73f","7c4799db0f364ac5baa8a7987b44149a","be1640e664c44df7b6fd0549fb12a4c3","355ab8d20c0f43b4bda4ed533a4edcd3","57f36ed86b6c4809971337eaa8d964a3","eac29d2974604951ba63f8e65675172e","ed19c56b20ba4cc088e85a25bf1d1e4e","5ab8f35107cd49df9e2fe7d17ccc0a42","a1616fad62924db78e443a8b93047265","5510ec05edc14e43a994498161bae651","ec32948c16b3443d8db3bf12a098c15a","5abe34cfd1df41d093a1c1d4b62388a6","e41f1757c1d9492da1d9c8f6e80d4874","b143d106dda74054bf568f5490099766","f21140dc2d85407ea2a487b93aacbc5b","7062c6b8509543bc97d15efb009b98e2","cf3493e5beb2455a9e2c92e670ab7c06","5dfd63859f784b09b0ab43fe51b616b0","28fd7936d80a49fa811210d21baeaf75","b4eeb0aca28d41dd813f389b654b88b8","5b7c1ed7646d4bd0bca9005d3000fd4b","618482e958f74bac8e637341c5ebc441","cf10d626a08647dc
af12bb0d2425277c","5ca5da6e43e24c0a98053c8201b1fe7d","5e829560c52849e187db0ed094acdf0a","1a7842e0efa24abeba6e1675583b8dd7","adc12fc45aaf48c6bcb24c8238abf300","a19c0cf31c3c4aeeb336c28cfc6762bb","f8e885cca8144136a341edb9dcf53f95","b526ff073a844b259458d5abc24665d4","d7e3906709ef4ef1a6d20d5edb9c5bd3","07b2452e6b3c406581d8405ed29dbfc2","a0a5467f1be14cf9b271995c8467d98c","90f480c849604618802a970439c004a3","c8694078b30c46af824862c6d5604e26","6eecdb3ddbca44e889995bba4143083a","d115a88dc64248c990319b2b2a95367a","264e8dd132844f55b69841415a8b819d","94e0cb53a5324b17965b40f76ddf5f48","680058a58f0747e58ccee1c3f59b5d43","5c23b40e9f2d4797840683184078a693","5c9ae4a0298c44ab881a5fac1e6be3e7","99eb5ff7212b4bf9ada29956e7327fcd","ea15658f530a40a0a3ee74d76c415b95","3d7d2ab0105d446db11421900ff92908","aa6b7143dbda4165805f21e9b47119d0","c9db5f9857414a518e58127bbf331d58","717c53fc2a8c47e6a85428b6c2f13b0d","836a82a00fee45c5bdb807b632a6fd18","949b5d5e19ac4058a6c3aae95f147d0f","868c8bb1089f45d9b49817017ad1fa39","73b7d4338ce241fca51d26baf1a7c94c","ae28dc20466446b6ba1fae25ab31e22b","f224a49d51d3485d9173ad23ee7a8fa3","b6930f727faf4af5ac6103f34a0728a3","7e4d704ccfbb413aac17080649470991","a950da66aac144b2a2e98d7861b63fa1","689c1e20ba9342dca8a7a8806fdcae8f","19898c6fdb57427a80263af18f762c22","4dab1258e1b44bc99d2714b00b89aa2f","5138c07602404491adbd286a0ac19bb6","97133fcbd22e4f6d835ad29b8517a3d0","adeb4ca8368c4f64a451ba708c8614f2","df8e65d254d44e1cb4147514915fbb30","5df370321ba244e0b778790e8a2d9a10","ac678daee17c4572a15387f65cf3a2e6","5263dc3f385a450eb304e909dd53d37e","1acac7477f36498a8763ce3aca41975e","6bfeb527c31c4741945917d4243246cc","fa6fd522a99e46e0a10ca64f4aa6d6cb","e171724c11814192bf84273c89402b34","64e6581e50e84e8685e5a4db09c5cbfd","e1a3c9180cab45a489a2d17a34b0eb5c","0a22ab96872644c09c079521ff278772","7568c3a49c0b4d349e36348c72dd1d10","00a4100953824e36a5a74585539d4aba","3d4245e6a02745e49da814c0d21d50f0","0cb68ca00dd343dd9488f0ef41ac9177","4753e3cf5f114096a7a2acde48b117ea","3ea79cb1ee8646019cce3
e161c0d57b1","b9524ffbcb6c449cba0ed72640bfb8e1","45343b2d50c846d09329377d993eec4e","5896c18516fe46f6bab83d226cfa2fee","6a3f4f35966444cda8a127373bbec506","b86e8c343bd24eee83256ed92f91561d","0396ab496b2b4819aaa6b4e5a8f85078","62ab062e6d424c45aca01945e179070c","9a905030128747dda71e544a218f83c1","2cff427ff3ef4e6982d2dfbd9232d0c3","a3f94b85301b491886a9f83b16aeac63","4a8472d9c15443039b3053e96a6a6d41","8e459af962f14b41bf8c992c5f3ab411","4deb011fc31e44b88c800d91e5f6a93d","e5da6ee403d040cbb2faba0a8bd81d22","a79e7053b6aa438bbfc03539a5ce95af","320e848473244e59aef9b1e400b09f1b","a13768a4c8894e2d88ea4ec1afd46bd2","f556bf7e32ba407199f139746e5415ff"]},"id":"_UUtlbRAySQ_","outputId":"62cf0657-fce0-4ea1-fdf9-de57e103085a","executionInfo":{"status":"ok","timestamp":1689544062035,"user_tz":420,"elapsed":5731079,"user":{"displayName":"Yu Wang","userId":"02802289530208391889"}}},"execution_count":3,"outputs":[{"output_type":"stream","name":"stderr","text":["<ipython-input-3-bba54cbd4740>:26: SettingWithCopyWarning: \n","A value is trying to be set on a copy of a slice from a DataFrame.\n","Try using .loc[row_indexer,col_indexer] = value instead\n","\n","See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n","  train['split_dummy'] = ''\n","<ipython-input-3-bba54cbd4740>:27: SettingWithCopyWarning: \n","A value is trying to be set on a copy of a slice from a DataFrame.\n","Try using .loc[row_indexer,col_indexer] = value instead\n","\n","See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n","  train['year'] = train['year'].astype(int)\n","<ipython-input-3-bba54cbd4740>:28: SettingWithCopyWarning: \n","A value is trying to be set on a copy of a slice from a DataFrame.\n","Try using .loc[row_indexer,col_indexer] = value instead\n","\n","See the caveats in the documentation: 
https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n","  train['month'] = train['month'].astype(int)\n"]},{"output_type":"stream","name":"stdout","text":["23868\n"]},{"output_type":"stream","name":"stderr","text":["  0%|          | 0/22572 [00:00<?, ?it/s]<ipython-input-3-bba54cbd4740>:34: SettingWithCopyWarning: \n","A value is trying to be set on a copy of a slice from a DataFrame\n","\n","See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n","  train['split_dummy'][i] = 0\n","<ipython-input-3-bba54cbd4740>:32: SettingWithCopyWarning: \n","A value is trying to be set on a copy of a slice from a DataFrame\n","\n","See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n","  train['split_dummy'][i] = 1\n","100%|██████████| 22572/22572 [00:07<00:00, 3111.60it/s]\n"]},{"output_type":"display_data","data":{"text/plain":["Downloading (…)okenizer_config.json:   0%|          | 0.00/270 [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"fa0e7bbe536e472e9991d863b102f15a"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["Downloading (…)lve/main/config.json:   0%|          | 0.00/570 [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"3bbe895893e148f9896676a31a88f3fc"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["Downloading (…)solve/main/vocab.txt:   0%|          | 0.00/224k [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"ec32948c16b3443d8db3bf12a098c15a"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["Downloading (…)/main/tokenizer.json:   0%|          | 0.00/454k [00:00<?, 
?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"618482e958f74bac8e637341c5ebc441"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["Downloading (…)cial_tokens_map.json:   0%|          | 0.00/112 [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"a0a5467f1be14cf9b271995c8467d98c"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["Map:   0%|          | 0/21924 [00:00<?, ? examples/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"ea15658f530a40a0a3ee74d76c415b95"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["Map:   0%|          | 0/648 [00:00<?, ? examples/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"b6930f727faf4af5ac6103f34a0728a3"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["Map:   0%|          | 0/1296 [00:00<?, ? 
examples/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"ac678daee17c4572a15387f65cf3a2e6"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["Downloading pytorch_model.bin:   0%|          | 0.00/437M [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"3d4245e6a02745e49da814c0d21d50f0"}},"metadata":{}},{"output_type":"stream","name":"stderr","text":["Some weights of the model checkpoint at snowood1/ConfliBERT-scr-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.transform.dense.bias', 'cls.predictions.bias', 'cls.predictions.decoder.bias', 'cls.predictions.decoder.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight']\n","- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. 
initializing a BertForSequenceClassification model from a BertForPreTraining model).\n","- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).\n","Some weights of BertForSequenceClassification were not initialized from the model checkpoint at snowood1/ConfliBERT-scr-uncased and are newly initialized: ['classifier.weight', 'bert.pooler.dense.weight', 'bert.pooler.dense.bias', 'classifier.bias']\n","You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n","Some weights of the model checkpoint at snowood1/ConfliBERT-scr-uncased were not used when initializing BertForSequenceClassification: ['cls.predictions.transform.dense.bias', 'cls.predictions.bias', 'cls.predictions.decoder.bias', 'cls.predictions.decoder.weight', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight']\n","- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. 
initializing a BertForSequenceClassification model from a BertForPreTraining model).\n","- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).\n","Some weights of BertForSequenceClassification were not initialized from the model checkpoint at snowood1/ConfliBERT-scr-uncased and are newly initialized: ['classifier.weight', 'bert.pooler.dense.weight', 'bert.pooler.dense.bias', 'classifier.bias']\n","You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n","/usr/local/lib/python3.10/dist-packages/transformers/optimization.py:391: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n","  warnings.warn(\n"]},{"output_type":"display_data","data":{"text/plain":["<IPython.core.display.HTML object>"],"text/html":["\n","    <div>\n","      \n","      <progress value='27420' max='27420' style='width:300px; height:20px; vertical-align: middle;'></progress>\n","      [27420/27420 1:30:43, Epoch 20/20]\n","    </div>\n","    <table border=\"1\" class=\"dataframe\">\n","  <thead>\n"," <tr style=\"text-align: left;\">\n","      <th>Step</th>\n","      <th>Training Loss</th>\n","      <th>Validation Loss</th>\n","      <th>Mse</th>\n","      <th>Mae</th>\n","      <th>R2</th>\n","      <th>Accuracy</th>\n","    </tr>\n","  </thead>\n","  <tbody>\n","    <tr>\n","      <td>500</td>\n","      <td>1.360600</td>\n","      <td>1.326622</td>\n","      <td>1.326622</td>\n","      <td>0.644018</td>\n","      <td>0.661316</td>\n","      <td>0.665123</td>\n","    </tr>\n","    <tr>\n","      <td>1000</td>\n","      <td>0.905900</td>\n","      <td>1.213927</td>\n","      
<td>1.213927</td>\n","      <td>0.631564</td>\n","      <td>0.690087</td>\n","      <td>0.695988</td>\n","    </tr>\n","    <tr>\n","      <td>1500</td>\n","      <td>0.847100</td>\n","      <td>1.252758</td>\n","      <td>1.252758</td>\n","      <td>0.623503</td>\n","      <td>0.680173</td>\n","      <td>0.691358</td>\n","    </tr>\n","    <tr>\n","      <td>2000</td>\n","      <td>0.650700</td>\n","      <td>1.182552</td>\n","      <td>1.182552</td>\n","      <td>0.632839</td>\n","      <td>0.698097</td>\n","      <td>0.706790</td>\n","    </tr>\n","    <tr>\n","      <td>2500</td>\n","      <td>0.661600</td>\n","      <td>0.924235</td>\n","      <td>0.924235</td>\n","      <td>0.496174</td>\n","      <td>0.764045</td>\n","      <td>0.723765</td>\n","    </tr>\n","    <tr>\n","      <td>3000</td>\n","      <td>0.650700</td>\n","      <td>1.279254</td>\n","      <td>1.279254</td>\n","      <td>0.621488</td>\n","      <td>0.673409</td>\n","      <td>0.677469</td>\n","    </tr>\n","    <tr>\n","      <td>3500</td>\n","      <td>0.575700</td>\n","      <td>1.065378</td>\n","      <td>1.065378</td>\n","      <td>0.520373</td>\n","      <td>0.728011</td>\n","      <td>0.726852</td>\n","    </tr>\n","    <tr>\n","      <td>4000</td>\n","      <td>0.525100</td>\n","      <td>0.981259</td>\n","      <td>0.981259</td>\n","      <td>0.513048</td>\n","      <td>0.749487</td>\n","      <td>0.706790</td>\n","    </tr>\n","    <tr>\n","      <td>4500</td>\n","      <td>0.442000</td>\n","      <td>1.020506</td>\n","      <td>1.020506</td>\n","      <td>0.666045</td>\n","      <td>0.739467</td>\n","      <td>0.679012</td>\n","    </tr>\n","    <tr>\n","      <td>5000</td>\n","      <td>0.484900</td>\n","      <td>0.970342</td>\n","      <td>0.970342</td>\n","      <td>0.518802</td>\n","      <td>0.752274</td>\n","      <td>0.731481</td>\n","    </tr>\n","    <tr>\n","      <td>5500</td>\n","      <td>0.473100</td>\n","      <td>1.037266</td>\n","      <td>1.037266</td>\n","      
<td>0.512102</td>\n","      <td>0.735188</td>\n","      <td>0.726852</td>\n","    </tr>\n","    <tr>\n","      <td>6000</td>\n","      <td>0.399000</td>\n","      <td>1.000108</td>\n","      <td>1.000108</td>\n","      <td>0.507818</td>\n","      <td>0.744674</td>\n","      <td>0.734568</td>\n","    </tr>\n","    <tr>\n","      <td>6500</td>\n","      <td>0.401400</td>\n","      <td>0.921212</td>\n","      <td>0.921212</td>\n","      <td>0.480386</td>\n","      <td>0.764816</td>\n","      <td>0.722222</td>\n","    </tr>\n","    <tr>\n","      <td>7000</td>\n","      <td>0.397800</td>\n","      <td>1.002888</td>\n","      <td>1.002888</td>\n","      <td>0.471389</td>\n","      <td>0.743965</td>\n","      <td>0.743827</td>\n","    </tr>\n","    <tr>\n","      <td>7500</td>\n","      <td>0.340100</td>\n","      <td>0.963183</td>\n","      <td>0.963183</td>\n","      <td>0.473426</td>\n","      <td>0.754101</td>\n","      <td>0.717593</td>\n","    </tr>\n","    <tr>\n","      <td>8000</td>\n","      <td>0.350700</td>\n","      <td>0.932367</td>\n","      <td>0.932367</td>\n","      <td>0.475609</td>\n","      <td>0.761968</td>\n","      <td>0.731481</td>\n","    </tr>\n","    <tr>\n","      <td>8500</td>\n","      <td>0.343400</td>\n","      <td>0.990344</td>\n","      <td>0.990344</td>\n","      <td>0.540053</td>\n","      <td>0.747167</td>\n","      <td>0.717593</td>\n","    </tr>\n","    <tr>\n","      <td>9000</td>\n","      <td>0.320900</td>\n","      <td>0.932563</td>\n","      <td>0.932563</td>\n","      <td>0.468170</td>\n","      <td>0.761918</td>\n","      <td>0.725309</td>\n","    </tr>\n","    <tr>\n","      <td>9500</td>\n","      <td>0.317500</td>\n","      <td>0.938374</td>\n","      <td>0.938374</td>\n","      <td>0.500528</td>\n","      <td>0.760435</td>\n","      <td>0.742284</td>\n","    </tr>\n","    <tr>\n","      <td>10000</td>\n","      <td>0.311500</td>\n","      <td>0.892150</td>\n","      <td>0.892150</td>\n","      <td>0.458372</td>\n","      
<td>0.772236</td>\n","      <td>0.733025</td>\n","    </tr>\n","    <tr>\n","      <td>10500</td>\n","      <td>0.286100</td>\n","      <td>0.958611</td>\n","      <td>0.958611</td>\n","      <td>0.496246</td>\n","      <td>0.755268</td>\n","      <td>0.734568</td>\n","    </tr>\n","    <tr>\n","      <td>11000</td>\n","      <td>0.303900</td>\n","      <td>0.978709</td>\n","      <td>0.978709</td>\n","      <td>0.510331</td>\n","      <td>0.750137</td>\n","      <td>0.731481</td>\n","    </tr>\n","    <tr>\n","      <td>11500</td>\n","      <td>0.289500</td>\n","      <td>0.948435</td>\n","      <td>0.948435</td>\n","      <td>0.470045</td>\n","      <td>0.757866</td>\n","      <td>0.739198</td>\n","    </tr>\n","    <tr>\n","      <td>12000</td>\n","      <td>0.282800</td>\n","      <td>0.919103</td>\n","      <td>0.919103</td>\n","      <td>0.491260</td>\n","      <td>0.765355</td>\n","      <td>0.742284</td>\n","    </tr>\n","    <tr>\n","      <td>12500</td>\n","      <td>0.274600</td>\n","      <td>0.934732</td>\n","      <td>0.934732</td>\n","      <td>0.471789</td>\n","      <td>0.761365</td>\n","      <td>0.736111</td>\n","    </tr>\n","    <tr>\n","      <td>13000</td>\n","      <td>0.251000</td>\n","      <td>0.943295</td>\n","      <td>0.943295</td>\n","      <td>0.479464</td>\n","      <td>0.759179</td>\n","      <td>0.726852</td>\n","    </tr>\n","    <tr>\n","      <td>13500</td>\n","      <td>0.286700</td>\n","      <td>0.909103</td>\n","      <td>0.909103</td>\n","      <td>0.454541</td>\n","      <td>0.767908</td>\n","      <td>0.745370</td>\n","    </tr>\n","    <tr>\n","      <td>14000</td>\n","      <td>0.284100</td>\n","      <td>0.935878</td>\n","      <td>0.935878</td>\n","      <td>0.464076</td>\n","      <td>0.761072</td>\n","      <td>0.743827</td>\n","    </tr>\n","    <tr>\n","      <td>14500</td>\n","      <td>0.248900</td>\n","      <td>0.962047</td>\n","      <td>0.962047</td>\n","      <td>0.480699</td>\n","      
<td>0.754391</td>\n","      <td>0.743827</td>\n","    </tr>\n","    <tr>\n","      <td>15000</td>\n","      <td>0.267100</td>\n","      <td>0.937032</td>\n","      <td>0.937032</td>\n","      <td>0.482391</td>\n","      <td>0.760778</td>\n","      <td>0.729938</td>\n","    </tr>\n","    <tr>\n","      <td>15500</td>\n","      <td>0.225100</td>\n","      <td>0.923875</td>\n","      <td>0.923875</td>\n","      <td>0.459116</td>\n","      <td>0.764137</td>\n","      <td>0.737654</td>\n","    </tr>\n","    <tr>\n","      <td>16000</td>\n","      <td>0.256400</td>\n","      <td>0.943426</td>\n","      <td>0.943427</td>\n","      <td>0.470725</td>\n","      <td>0.759145</td>\n","      <td>0.748457</td>\n","    </tr>\n","    <tr>\n","      <td>16500</td>\n","      <td>0.280200</td>\n","      <td>0.965545</td>\n","      <td>0.965545</td>\n","      <td>0.475132</td>\n","      <td>0.753498</td>\n","      <td>0.722222</td>\n","    </tr>\n","    <tr>\n","      <td>17000</td>\n","      <td>0.256200</td>\n","      <td>0.914998</td>\n","      <td>0.914997</td>\n","      <td>0.455914</td>\n","      <td>0.766403</td>\n","      <td>0.743827</td>\n","    </tr>\n","    <tr>\n","      <td>17500</td>\n","      <td>0.234500</td>\n","      <td>0.924370</td>\n","      <td>0.924370</td>\n","      <td>0.460531</td>\n","      <td>0.764010</td>\n","      <td>0.751543</td>\n","    </tr>\n","    <tr>\n","      <td>18000</td>\n","      <td>0.233100</td>\n","      <td>0.935030</td>\n","      <td>0.935030</td>\n","      <td>0.466955</td>\n","      <td>0.761289</td>\n","      <td>0.728395</td>\n","    </tr>\n","    <tr>\n","      <td>18500</td>\n","      <td>0.260700</td>\n","      <td>0.915799</td>\n","      <td>0.915799</td>\n","      <td>0.460970</td>\n","      <td>0.766198</td>\n","      <td>0.736111</td>\n","    </tr>\n","    <tr>\n","      <td>19000</td>\n","      <td>0.248200</td>\n","      <td>0.872648</td>\n","      <td>0.872648</td>\n","      <td>0.445931</td>\n","      
<td>0.777215</td>\n","      <td>0.750000</td>\n","    </tr>\n","    <tr>\n","      <td>19500</td>\n","      <td>0.240900</td>\n","      <td>0.909036</td>\n","      <td>0.909036</td>\n","      <td>0.485277</td>\n","      <td>0.767925</td>\n","      <td>0.739198</td>\n","    </tr>\n","    <tr>\n","      <td>20000</td>\n","      <td>0.199100</td>\n","      <td>0.912820</td>\n","      <td>0.912820</td>\n","      <td>0.455910</td>\n","      <td>0.766959</td>\n","      <td>0.740741</td>\n","    </tr>\n","    <tr>\n","      <td>20500</td>\n","      <td>0.252500</td>\n","      <td>0.913583</td>\n","      <td>0.913583</td>\n","      <td>0.456692</td>\n","      <td>0.766764</td>\n","      <td>0.737654</td>\n","    </tr>\n","    <tr>\n","      <td>21000</td>\n","      <td>0.259900</td>\n","      <td>0.906944</td>\n","      <td>0.906944</td>\n","      <td>0.505572</td>\n","      <td>0.768459</td>\n","      <td>0.743827</td>\n","    </tr>\n","    <tr>\n","      <td>21500</td>\n","      <td>0.241700</td>\n","      <td>0.904064</td>\n","      <td>0.904064</td>\n","      <td>0.450724</td>\n","      <td>0.769194</td>\n","      <td>0.742284</td>\n","    </tr>\n","    <tr>\n","      <td>22000</td>\n","      <td>0.196200</td>\n","      <td>0.929082</td>\n","      <td>0.929082</td>\n","      <td>0.460261</td>\n","      <td>0.762807</td>\n","      <td>0.740741</td>\n","    </tr>\n","    <tr>\n","      <td>22500</td>\n","      <td>0.233700</td>\n","      <td>0.899421</td>\n","      <td>0.899421</td>\n","      <td>0.447975</td>\n","      <td>0.770380</td>\n","      <td>0.745370</td>\n","    </tr>\n","    <tr>\n","      <td>23000</td>\n","      <td>0.233200</td>\n","      <td>0.907124</td>\n","      <td>0.907124</td>\n","      <td>0.449682</td>\n","      <td>0.768413</td>\n","      <td>0.742284</td>\n","    </tr>\n","    <tr>\n","      <td>23500</td>\n","      <td>0.220500</td>\n","      <td>0.907685</td>\n","      <td>0.907685</td>\n","      <td>0.467251</td>\n","      
<td>0.768270</td>\n","      <td>0.745370</td>\n","    </tr>\n","    <tr>\n","      <td>24000</td>\n","      <td>0.211700</td>\n","      <td>0.926664</td>\n","      <td>0.926664</td>\n","      <td>0.456733</td>\n","      <td>0.763424</td>\n","      <td>0.737654</td>\n","    </tr>\n","    <tr>\n","      <td>24500</td>\n","      <td>0.260900</td>\n","      <td>0.922859</td>\n","      <td>0.922859</td>\n","      <td>0.454164</td>\n","      <td>0.764396</td>\n","      <td>0.736111</td>\n","    </tr>\n","    <tr>\n","      <td>25000</td>\n","      <td>0.223700</td>\n","      <td>0.899206</td>\n","      <td>0.899206</td>\n","      <td>0.458103</td>\n","      <td>0.770434</td>\n","      <td>0.743827</td>\n","    </tr>\n","    <tr>\n","      <td>25500</td>\n","      <td>0.244500</td>\n","      <td>0.903693</td>\n","      <td>0.903693</td>\n","      <td>0.460845</td>\n","      <td>0.769289</td>\n","      <td>0.745370</td>\n","    </tr>\n","    <tr>\n","      <td>26000</td>\n","      <td>0.193000</td>\n","      <td>0.912548</td>\n","      <td>0.912548</td>\n","      <td>0.445913</td>\n","      <td>0.767028</td>\n","      <td>0.745370</td>\n","    </tr>\n","    <tr>\n","      <td>26500</td>\n","      <td>0.209500</td>\n","      <td>0.898440</td>\n","      <td>0.898440</td>\n","      <td>0.459594</td>\n","      <td>0.770630</td>\n","      <td>0.743827</td>\n","    </tr>\n","    <tr>\n","      <td>27000</td>\n","      <td>0.231900</td>\n","      <td>0.908017</td>\n","      <td>0.908017</td>\n","      <td>0.445089</td>\n","      <td>0.768185</td>\n","      <td>0.745370</td>\n","    </tr>\n","  </tbody>\n","</table><p>"]},"metadata":{}},{"output_type":"stream","name":"stdout","text":["{'loss': 1.3606, 'learning_rate': 1.963530269876003e-05, 'epoch': 0.36, 'step': 500}\n","{'eval_loss': 1.3266222476959229, 'eval_mse': 1.3266222476959229, 'eval_mae': 0.6440179944038391, 'eval_r2': 0.6613159635178982, 'eval_accuracy': 0.6651234567901234, 'eval_runtime': 2.5284, 
'eval_samples_per_second': 256.289, 'eval_steps_per_second': 16.216, 'epoch': 0.36, 'step': 500}\n","{'loss': 0.9059, 'learning_rate': 1.927060539752006e-05, 'epoch': 0.73, 'step': 1000}\n","{'eval_loss': 1.2139272689819336, 'eval_mse': 1.2139272689819336, 'eval_mae': 0.6315637230873108, 'eval_r2': 0.6900867974105013, 'eval_accuracy': 0.6959876543209876, 'eval_runtime': 2.5296, 'eval_samples_per_second': 256.165, 'eval_steps_per_second': 16.208, 'epoch': 0.73, 'step': 1000}\n","{'loss': 0.8471, 'learning_rate': 1.890590809628009e-05, 'epoch': 1.09, 'step': 1500}\n","{'eval_loss': 1.2527580261230469, 'eval_mse': 1.2527579069137573, 'eval_mae': 0.6235031485557556, 'eval_r2': 0.6801733944856283, 'eval_accuracy': 0.691358024691358, 'eval_runtime': 2.539, 'eval_samples_per_second': 255.214, 'eval_steps_per_second': 16.148, 'epoch': 1.09, 'step': 1500}\n","{'loss': 0.6507, 'learning_rate': 1.854121079504012e-05, 'epoch': 1.46, 'step': 2000}\n","{'eval_loss': 1.1825522184371948, 'eval_mse': 1.1825522184371948, 'eval_mae': 0.6328388452529907, 'eval_r2': 0.6980967987182833, 'eval_accuracy': 0.7067901234567902, 'eval_runtime': 2.5291, 'eval_samples_per_second': 256.214, 'eval_steps_per_second': 16.211, 'epoch': 1.46, 'step': 2000}\n","{'loss': 0.6616, 'learning_rate': 1.8176513493800147e-05, 'epoch': 1.82, 'step': 2500}\n","{'eval_loss': 0.9242345690727234, 'eval_mse': 0.9242345690727234, 'eval_mae': 0.49617353081703186, 'eval_r2': 0.7640447854555873, 'eval_accuracy': 0.7237654320987654, 'eval_runtime': 2.5303, 'eval_samples_per_second': 256.101, 'eval_steps_per_second': 16.204, 'epoch': 1.82, 'step': 2500}\n","{'loss': 0.6507, 'learning_rate': 1.7811816192560176e-05, 'epoch': 2.19, 'step': 3000}\n","{'eval_loss': 1.2792540788650513, 'eval_mse': 1.2792540788650513, 'eval_mae': 0.6214882135391235, 'eval_r2': 0.6734089771262252, 'eval_accuracy': 0.6774691358024691, 'eval_runtime': 2.527, 'eval_samples_per_second': 256.427, 'eval_steps_per_second': 16.225, 'epoch': 2.19, 
'step': 3000}\n","{'loss': 0.5757, 'learning_rate': 1.7447118891320204e-05, 'epoch': 2.55, 'step': 3500}\n","{'eval_loss': 1.0653777122497559, 'eval_mse': 1.0653778314590454, 'eval_mae': 0.5203731060028076, 'eval_r2': 0.7280111920072116, 'eval_accuracy': 0.7268518518518519, 'eval_runtime': 2.5274, 'eval_samples_per_second': 256.393, 'eval_steps_per_second': 16.222, 'epoch': 2.55, 'step': 3500}\n","{'loss': 0.5251, 'learning_rate': 1.7082421590080233e-05, 'epoch': 2.92, 'step': 4000}\n","{'eval_loss': 0.9812591671943665, 'eval_mse': 0.9812591671943665, 'eval_mae': 0.5130482912063599, 'eval_r2': 0.7494865011741172, 'eval_accuracy': 0.7067901234567902, 'eval_runtime': 2.5325, 'eval_samples_per_second': 255.871, 'eval_steps_per_second': 16.189, 'epoch': 2.92, 'step': 4000}\n","{'loss': 0.442, 'learning_rate': 1.6717724288840264e-05, 'epoch': 3.28, 'step': 4500}\n","{'eval_loss': 1.0205059051513672, 'eval_mse': 1.0205059051513672, 'eval_mae': 0.6660449504852295, 'eval_r2': 0.7394668733787564, 'eval_accuracy': 0.6790123456790124, 'eval_runtime': 2.5326, 'eval_samples_per_second': 255.859, 'eval_steps_per_second': 16.189, 'epoch': 3.28, 'step': 4500}\n","{'loss': 0.4849, 'learning_rate': 1.6353026987600293e-05, 'epoch': 3.65, 'step': 5000}\n","{'eval_loss': 0.9703423976898193, 'eval_mse': 0.9703422784805298, 'eval_mae': 0.518801748752594, 'eval_r2': 0.7522735364823493, 'eval_accuracy': 0.7314814814814815, 'eval_runtime': 2.5389, 'eval_samples_per_second': 255.232, 'eval_steps_per_second': 16.149, 'epoch': 3.65, 'step': 5000}\n","{'loss': 0.4731, 'learning_rate': 1.598832968636032e-05, 'epoch': 4.01, 'step': 5500}\n","{'eval_loss': 1.0372655391693115, 'eval_mse': 1.0372657775878906, 'eval_mae': 0.5121023654937744, 'eval_r2': 0.7351881611327448, 'eval_accuracy': 0.7268518518518519, 'eval_runtime': 2.5304, 'eval_samples_per_second': 256.084, 'eval_steps_per_second': 16.203, 'epoch': 4.01, 'step': 5500}\n","{'loss': 0.399, 'learning_rate': 1.562363238512035e-05, 'epoch': 
4.38, 'step': 6000}\n","{'eval_loss': 1.000108242034912, 'eval_mse': 1.000108242034912, 'eval_mae': 0.507818341255188, 'eval_r2': 0.7446743675979486, 'eval_accuracy': 0.7345679012345679, 'eval_runtime': 2.5275, 'eval_samples_per_second': 256.38, 'eval_steps_per_second': 16.222, 'epoch': 4.38, 'step': 6000}\n","{'loss': 0.4014, 'learning_rate': 1.5258935083880378e-05, 'epoch': 4.74, 'step': 6500}\n","{'eval_loss': 0.9212120771408081, 'eval_mse': 0.9212121963500977, 'eval_mae': 0.4803858697414398, 'eval_r2': 0.7648163741981616, 'eval_accuracy': 0.7222222222222222, 'eval_runtime': 2.5262, 'eval_samples_per_second': 256.51, 'eval_steps_per_second': 16.23, 'epoch': 4.74, 'step': 6500}\n","{'loss': 0.3978, 'learning_rate': 1.489423778264041e-05, 'epoch': 5.11, 'step': 7000}\n","{'eval_loss': 1.0028882026672363, 'eval_mse': 1.0028882026672363, 'eval_mae': 0.47138914465904236, 'eval_r2': 0.743964624769309, 'eval_accuracy': 0.7438271604938271, 'eval_runtime': 2.5462, 'eval_samples_per_second': 254.494, 'eval_steps_per_second': 16.102, 'epoch': 5.11, 'step': 7000}\n","{'loss': 0.3401, 'learning_rate': 1.452954048140044e-05, 'epoch': 5.47, 'step': 7500}\n","{'eval_loss': 0.9631833434104919, 'eval_mse': 0.9631834626197815, 'eval_mae': 0.47342631220817566, 'eval_r2': 0.7541011955420249, 'eval_accuracy': 0.7175925925925926, 'eval_runtime': 2.5314, 'eval_samples_per_second': 255.984, 'eval_steps_per_second': 16.197, 'epoch': 5.47, 'step': 7500}\n","{'loss': 0.3507, 'learning_rate': 1.4164843180160469e-05, 'epoch': 5.84, 'step': 8000}\n","{'eval_loss': 0.9323673844337463, 'eval_mse': 0.9323673844337463, 'eval_mae': 0.4756087362766266, 'eval_r2': 0.7619684768426419, 'eval_accuracy': 0.7314814814814815, 'eval_runtime': 2.5169, 'eval_samples_per_second': 257.463, 'eval_steps_per_second': 16.29, 'epoch': 5.84, 'step': 8000}\n","{'loss': 0.3434, 'learning_rate': 1.3800145878920497e-05, 'epoch': 6.2, 'step': 8500}\n","{'eval_loss': 0.9903438091278076, 'eval_mse': 0.9903438091278076, 
'eval_mae': 0.5400528907775879, 'eval_r2': 0.7471672074984563, 'eval_accuracy': 0.7175925925925926, 'eval_runtime': 2.5178, 'eval_samples_per_second': 257.367, 'eval_steps_per_second': 16.284, 'epoch': 6.2, 'step': 8500}\n","{'loss': 0.3209, 'learning_rate': 1.3435448577680525e-05, 'epoch': 6.56, 'step': 9000}\n","{'eval_loss': 0.9325634837150574, 'eval_mse': 0.9325634837150574, 'eval_mae': 0.468170166015625, 'eval_r2': 0.7619184276797051, 'eval_accuracy': 0.7253086419753086, 'eval_runtime': 2.5144, 'eval_samples_per_second': 257.715, 'eval_steps_per_second': 16.306, 'epoch': 6.56, 'step': 9000}\n","{'loss': 0.3175, 'learning_rate': 1.3070751276440557e-05, 'epoch': 6.93, 'step': 9500}\n","{'eval_loss': 0.9383742809295654, 'eval_mse': 0.9383742809295654, 'eval_mae': 0.5005282163619995, 'eval_r2': 0.7604349328404139, 'eval_accuracy': 0.7422839506172839, 'eval_runtime': 2.504, 'eval_samples_per_second': 258.784, 'eval_steps_per_second': 16.374, 'epoch': 6.93, 'step': 9500}\n","{'loss': 0.3115, 'learning_rate': 1.2706053975200586e-05, 'epoch': 7.29, 'step': 10000}\n","{'eval_loss': 0.8921498656272888, 'eval_mse': 0.8921498656272888, 'eval_mae': 0.45837152004241943, 'eval_r2': 0.7722359264759189, 'eval_accuracy': 0.7330246913580247, 'eval_runtime': 2.5083, 'eval_samples_per_second': 258.34, 'eval_steps_per_second': 16.346, 'epoch': 7.29, 'step': 10000}\n","{'loss': 0.2861, 'learning_rate': 1.2341356673960614e-05, 'epoch': 7.66, 'step': 10500}\n","{'eval_loss': 0.9586113691329956, 'eval_mse': 0.9586113691329956, 'eval_mae': 0.496246337890625, 'eval_r2': 0.755268452246405, 'eval_accuracy': 0.7345679012345679, 'eval_runtime': 2.5199, 'eval_samples_per_second': 257.149, 'eval_steps_per_second': 16.27, 'epoch': 7.66, 'step': 10500}\n","{'loss': 0.3039, 'learning_rate': 1.1976659372720643e-05, 'epoch': 8.02, 'step': 11000}\n","{'eval_loss': 0.9787093997001648, 'eval_mse': 0.9787093997001648, 'eval_mae': 0.5103311538696289, 'eval_r2': 0.7501374557177363, 'eval_accuracy': 
0.7314814814814815, 'eval_runtime': 2.5138, 'eval_samples_per_second': 257.773, 'eval_steps_per_second': 16.31, 'epoch': 8.02, 'step': 11000}\n","{'loss': 0.2895, 'learning_rate': 1.1611962071480671e-05, 'epoch': 8.39, 'step': 11500}\n","{'eval_loss': 0.9484348893165588, 'eval_mse': 0.9484348297119141, 'eval_mae': 0.470044881105423, 'eval_r2': 0.7578664923897899, 'eval_accuracy': 0.7391975308641975, 'eval_runtime': 2.5139, 'eval_samples_per_second': 257.765, 'eval_steps_per_second': 16.309, 'epoch': 8.39, 'step': 11500}\n","{'loss': 0.2828, 'learning_rate': 1.12472647702407e-05, 'epoch': 8.75, 'step': 12000}\n","{'eval_loss': 0.9191032648086548, 'eval_mse': 0.9191031455993652, 'eval_mae': 0.49125972390174866, 'eval_r2': 0.7653547825924585, 'eval_accuracy': 0.7422839506172839, 'eval_runtime': 2.5174, 'eval_samples_per_second': 257.407, 'eval_steps_per_second': 16.287, 'epoch': 8.75, 'step': 12000}\n","{'loss': 0.2746, 'learning_rate': 1.0882567469000731e-05, 'epoch': 9.12, 'step': 12500}\n","{'eval_loss': 0.9347315430641174, 'eval_mse': 0.9347315430641174, 'eval_mae': 0.47178933024406433, 'eval_r2': 0.7613649068770805, 'eval_accuracy': 0.7361111111111112, 'eval_runtime': 2.513, 'eval_samples_per_second': 257.855, 'eval_steps_per_second': 16.315, 'epoch': 9.12, 'step': 12500}\n","{'loss': 0.251, 'learning_rate': 1.051787016776076e-05, 'epoch': 9.48, 'step': 13000}\n","{'eval_loss': 0.9432949423789978, 'eval_mse': 0.943294882774353, 'eval_mae': 0.4794642925262451, 'eval_r2': 0.7591787013524456, 'eval_accuracy': 0.7268518518518519, 'eval_runtime': 2.5251, 'eval_samples_per_second': 256.619, 'eval_steps_per_second': 16.237, 'epoch': 9.48, 'step': 13000}\n","{'loss': 0.2867, 'learning_rate': 1.0153172866520788e-05, 'epoch': 9.85, 'step': 13500}\n","{'eval_loss': 0.9091032147407532, 'eval_mse': 0.9091032147407532, 'eval_mae': 0.45454132556915283, 'eval_r2': 0.7679077841631738, 'eval_accuracy': 0.7453703703703703, 'eval_runtime': 2.5067, 'eval_samples_per_second': 258.504, 
'eval_steps_per_second': 16.356, 'epoch': 9.85, 'step': 13500}\n","{'loss': 0.2841, 'learning_rate': 9.788475565280817e-06, 'epoch': 10.21, 'step': 14000}\n","{'eval_loss': 0.9358775019645691, 'eval_mse': 0.9358775019645691, 'eval_mae': 0.4640760123729706, 'eval_r2': 0.7610723545903177, 'eval_accuracy': 0.7438271604938271, 'eval_runtime': 2.5052, 'eval_samples_per_second': 258.659, 'eval_steps_per_second': 16.366, 'epoch': 10.21, 'step': 14000}\n","{'loss': 0.2489, 'learning_rate': 9.423778264040847e-06, 'epoch': 10.58, 'step': 14500}\n","{'eval_loss': 0.9620466828346252, 'eval_mse': 0.9620466828346252, 'eval_mae': 0.48069870471954346, 'eval_r2': 0.7543914099266968, 'eval_accuracy': 0.7438271604938271, 'eval_runtime': 2.5148, 'eval_samples_per_second': 257.679, 'eval_steps_per_second': 16.304, 'epoch': 10.58, 'step': 14500}\n","{'loss': 0.2671, 'learning_rate': 9.059080962800875e-06, 'epoch': 10.94, 'step': 15000}\n","{'eval_loss': 0.9370319843292236, 'eval_mse': 0.9370319843292236, 'eval_mae': 0.48239073157310486, 'eval_r2': 0.7607776052174111, 'eval_accuracy': 0.7299382716049383, 'eval_runtime': 2.4977, 'eval_samples_per_second': 259.438, 'eval_steps_per_second': 16.415, 'epoch': 10.94, 'step': 15000}\n","{'loss': 0.2251, 'learning_rate': 8.694383661560905e-06, 'epoch': 11.31, 'step': 15500}\n","{'eval_loss': 0.9238748550415039, 'eval_mse': 0.9238749146461487, 'eval_mae': 0.4591164290904999, 'eval_r2': 0.7641365877046751, 'eval_accuracy': 0.7376543209876543, 'eval_runtime': 2.5043, 'eval_samples_per_second': 258.757, 'eval_steps_per_second': 16.372, 'epoch': 11.31, 'step': 15500}\n","{'loss': 0.2564, 'learning_rate': 8.329686360320934e-06, 'epoch': 11.67, 'step': 16000}\n","{'eval_loss': 0.9434264302253723, 'eval_mse': 0.9434265494346619, 'eval_mae': 0.47072479128837585, 'eval_r2': 0.7591451089478789, 'eval_accuracy': 0.7484567901234568, 'eval_runtime': 2.5175, 'eval_samples_per_second': 257.398, 'eval_steps_per_second': 16.286, 'epoch': 11.67, 'step': 
16000}\n","{'loss': 0.2802, 'learning_rate': 7.964989059080964e-06, 'epoch': 12.04, 'step': 16500}\n","{'eval_loss': 0.9655452966690063, 'eval_mse': 0.9655451774597168, 'eval_mae': 0.4751320481300354, 'eval_r2': 0.7534982439810854, 'eval_accuracy': 0.7222222222222222, 'eval_runtime': 2.5029, 'eval_samples_per_second': 258.896, 'eval_steps_per_second': 16.381, 'epoch': 12.04, 'step': 16500}\n","{'loss': 0.2562, 'learning_rate': 7.600291757840993e-06, 'epoch': 12.4, 'step': 17000}\n","{'eval_loss': 0.9149975180625916, 'eval_mse': 0.9149974584579468, 'eval_mae': 0.455913782119751, 'eval_r2': 0.7664029758415661, 'eval_accuracy': 0.7438271604938271, 'eval_runtime': 2.501, 'eval_samples_per_second': 259.092, 'eval_steps_per_second': 16.393, 'epoch': 12.4, 'step': 17000}\n","{'loss': 0.2345, 'learning_rate': 7.2355944566010216e-06, 'epoch': 12.76, 'step': 17500}\n","{'eval_loss': 0.9243696331977844, 'eval_mse': 0.9243695139884949, 'eval_mae': 0.46053069829940796, 'eval_r2': 0.7640103004865517, 'eval_accuracy': 0.7515432098765432, 'eval_runtime': 2.5185, 'eval_samples_per_second': 257.3, 'eval_steps_per_second': 16.28, 'epoch': 12.76, 'step': 17500}\n","{'loss': 0.2331, 'learning_rate': 6.87089715536105e-06, 'epoch': 13.13, 'step': 18000}\n","{'eval_loss': 0.9350301623344421, 'eval_mse': 0.9350301623344421, 'eval_mae': 0.4669547379016876, 'eval_r2': 0.761288685356652, 'eval_accuracy': 0.7283950617283951, 'eval_runtime': 2.5097, 'eval_samples_per_second': 258.201, 'eval_steps_per_second': 16.337, 'epoch': 13.13, 'step': 18000}\n","{'loss': 0.2607, 'learning_rate': 6.50619985412108e-06, 'epoch': 13.49, 'step': 18500}\n","{'eval_loss': 0.915799081325531, 'eval_mse': 0.9157989621162415, 'eval_mae': 0.4609695374965668, 'eval_r2': 0.7661983374548564, 'eval_accuracy': 0.7361111111111112, 'eval_runtime': 2.5043, 'eval_samples_per_second': 258.758, 'eval_steps_per_second': 16.372, 'epoch': 13.49, 'step': 18500}\n","{'loss': 0.2482, 'learning_rate': 6.141502552881109e-06, 'epoch': 
13.86, 'step': 19000}\n","{'eval_loss': 0.8726477026939392, 'eval_mse': 0.8726477026939392, 'eval_mae': 0.4459306299686432, 'eval_r2': 0.7772147977037966, 'eval_accuracy': 0.75, 'eval_runtime': 2.5099, 'eval_samples_per_second': 258.175, 'eval_steps_per_second': 16.335, 'epoch': 13.86, 'step': 19000}\n","{'loss': 0.2409, 'learning_rate': 5.776805251641139e-06, 'epoch': 14.22, 'step': 19500}\n","{'eval_loss': 0.9090355634689331, 'eval_mse': 0.9090355634689331, 'eval_mae': 0.4852771461009979, 'eval_r2': 0.7679250182905029, 'eval_accuracy': 0.7391975308641975, 'eval_runtime': 2.5146, 'eval_samples_per_second': 257.693, 'eval_steps_per_second': 16.305, 'epoch': 14.22, 'step': 19500}\n","{'loss': 0.1991, 'learning_rate': 5.412107950401167e-06, 'epoch': 14.59, 'step': 20000}\n","{'eval_loss': 0.9128195643424988, 'eval_mse': 0.9128195643424988, 'eval_mae': 0.45591047406196594, 'eval_r2': 0.7669590014723258, 'eval_accuracy': 0.7407407407407407, 'eval_runtime': 2.5219, 'eval_samples_per_second': 256.951, 'eval_steps_per_second': 16.258, 'epoch': 14.59, 'step': 20000}\n","{'loss': 0.2525, 'learning_rate': 5.0474106491611964e-06, 'epoch': 14.95, 'step': 20500}\n","{'eval_loss': 0.9135825037956238, 'eval_mse': 0.9135825037956238, 'eval_mae': 0.45669224858283997, 'eval_r2': 0.7667642033419517, 'eval_accuracy': 0.7376543209876543, 'eval_runtime': 2.5171, 'eval_samples_per_second': 257.439, 'eval_steps_per_second': 16.289, 'epoch': 14.95, 'step': 20500}\n","{'loss': 0.2599, 'learning_rate': 4.682713347921226e-06, 'epoch': 15.32, 'step': 21000}\n","{'eval_loss': 0.9069437384605408, 'eval_mse': 0.9069437384605408, 'eval_mae': 0.5055718421936035, 'eval_r2': 0.7684590817580503, 'eval_accuracy': 0.7438271604938271, 'eval_runtime': 2.5058, 'eval_samples_per_second': 258.604, 'eval_steps_per_second': 16.362, 'epoch': 15.32, 'step': 21000}\n","{'loss': 0.2417, 'learning_rate': 4.318016046681255e-06, 'epoch': 15.68, 'step': 21500}\n","{'eval_loss': 0.9040640592575073, 'eval_mse': 
0.9040640592575073, 'eval_mae': 0.4507242441177368, 'eval_r2': 0.7691942550586197, 'eval_accuracy': 0.7422839506172839, 'eval_runtime': 2.5027, 'eval_samples_per_second': 258.916, 'eval_steps_per_second': 16.382, 'epoch': 15.68, 'step': 21500}\n","{'loss': 0.1962, 'learning_rate': 3.953318745441284e-06, 'epoch': 16.05, 'step': 22000}\n","{'eval_loss': 0.9290815591812134, 'eval_mse': 0.9290815591812134, 'eval_mae': 0.4602608382701874, 'eval_r2': 0.7628073420007171, 'eval_accuracy': 0.7407407407407407, 'eval_runtime': 2.5068, 'eval_samples_per_second': 258.5, 'eval_steps_per_second': 16.356, 'epoch': 16.05, 'step': 22000}\n","{'loss': 0.2337, 'learning_rate': 3.5886214442013136e-06, 'epoch': 16.41, 'step': 22500}\n","{'eval_loss': 0.8994207382202148, 'eval_mse': 0.8994206786155701, 'eval_mae': 0.4479749798774719, 'eval_r2': 0.770379696399708, 'eval_accuracy': 0.7453703703703703, 'eval_runtime': 2.5069, 'eval_samples_per_second': 258.487, 'eval_steps_per_second': 16.355, 'epoch': 16.41, 'step': 22500}\n","{'loss': 0.2332, 'learning_rate': 3.223924142961342e-06, 'epoch': 16.78, 'step': 23000}\n","{'eval_loss': 0.9071242809295654, 'eval_mse': 0.9071242809295654, 'eval_mae': 0.4496820569038391, 'eval_r2': 0.7684129953566019, 'eval_accuracy': 0.7422839506172839, 'eval_runtime': 2.5103, 'eval_samples_per_second': 258.135, 'eval_steps_per_second': 16.333, 'epoch': 16.78, 'step': 23000}\n","{'loss': 0.2205, 'learning_rate': 2.8592268417213713e-06, 'epoch': 17.14, 'step': 23500}\n","{'eval_loss': 0.9076851606369019, 'eval_mse': 0.9076851606369019, 'eval_mae': 0.4672510623931885, 'eval_r2': 0.7682697960665454, 'eval_accuracy': 0.7453703703703703, 'eval_runtime': 2.5129, 'eval_samples_per_second': 257.865, 'eval_steps_per_second': 16.316, 'epoch': 17.14, 'step': 23500}\n","{'loss': 0.2117, 'learning_rate': 2.4945295404814006e-06, 'epoch': 17.51, 'step': 24000}\n","{'eval_loss': 0.9266643524169922, 'eval_mse': 0.9266643524169922, 'eval_mae': 0.45673322677612305, 'eval_r2': 
0.7634244433560223, 'eval_accuracy': 0.7376543209876543, 'eval_runtime': 2.5112, 'eval_samples_per_second': 258.043, 'eval_steps_per_second': 16.327, 'epoch': 17.51, 'step': 24000}\n","{'loss': 0.2609, 'learning_rate': 2.12983223924143e-06, 'epoch': 17.87, 'step': 24500}\n","{'eval_loss': 0.922858715057373, 'eval_mse': 0.922858715057373, 'eval_mae': 0.45416387915611267, 'eval_r2': 0.7643960211822858, 'eval_accuracy': 0.7361111111111112, 'eval_runtime': 2.5166, 'eval_samples_per_second': 257.494, 'eval_steps_per_second': 16.292, 'epoch': 17.87, 'step': 24500}\n","{'loss': 0.2237, 'learning_rate': 1.765134938001459e-06, 'epoch': 18.23, 'step': 25000}\n","{'eval_loss': 0.8992061018943787, 'eval_mse': 0.8992061018943787, 'eval_mae': 0.4581030309200287, 'eval_r2': 0.7704344887926879, 'eval_accuracy': 0.7438271604938271, 'eval_runtime': 2.51, 'eval_samples_per_second': 258.165, 'eval_steps_per_second': 16.335, 'epoch': 18.23, 'step': 25000}\n","{'loss': 0.2445, 'learning_rate': 1.400437636761488e-06, 'epoch': 18.6, 'step': 25500}\n","{'eval_loss': 0.9036925435066223, 'eval_mse': 0.9036926627159119, 'eval_mae': 0.46084463596343994, 'eval_r2': 0.7692890756103505, 'eval_accuracy': 0.7453703703703703, 'eval_runtime': 2.5072, 'eval_samples_per_second': 258.454, 'eval_steps_per_second': 16.353, 'epoch': 18.6, 'step': 25500}\n","{'loss': 0.193, 'learning_rate': 1.0357403355215171e-06, 'epoch': 18.96, 'step': 26000}\n","{'eval_loss': 0.9125481247901917, 'eval_mse': 0.9125481247901917, 'eval_mae': 0.4459134340286255, 'eval_r2': 0.767028306626111, 'eval_accuracy': 0.7453703703703703, 'eval_runtime': 2.5087, 'eval_samples_per_second': 258.299, 'eval_steps_per_second': 16.343, 'epoch': 18.96, 'step': 26000}\n","{'loss': 0.2095, 'learning_rate': 6.710430342815463e-07, 'epoch': 19.33, 'step': 26500}\n","{'eval_loss': 0.8984403014183044, 'eval_mse': 0.8984403014183044, 'eval_mae': 0.4595937728881836, 'eval_r2': 0.7706299858549827, 'eval_accuracy': 0.7438271604938271, 'eval_runtime': 
2.5279, 'eval_samples_per_second': 256.341, 'eval_steps_per_second': 16.219, 'epoch': 19.33, 'step': 26500}\n","{'loss': 0.2319, 'learning_rate': 3.063457330415755e-07, 'epoch': 19.69, 'step': 27000}\n","{'eval_loss': 0.9080169200897217, 'eval_mse': 0.9080169796943665, 'eval_mae': 0.4450893998146057, 'eval_r2': 0.7681851052007992, 'eval_accuracy': 0.7453703703703703, 'eval_runtime': 2.5123, 'eval_samples_per_second': 257.928, 'eval_steps_per_second': 16.32, 'epoch': 19.69, 'step': 27000}\n","{'train_runtime': 5446.5671, 'train_samples_per_second': 80.506, 'train_steps_per_second': 5.034, 'total_flos': 5.768394985156608e+16, 'train_loss': 0.35347716305744553, 'epoch': 20.0, 'step': 27420}\n"]},{"output_type":"display_data","data":{"text/plain":["<IPython.core.display.HTML object>"],"text/html":[]},"metadata":{}},{"output_type":"stream","name":"stdout","text":["[[7.2968984 ]\n"," [6.805175  ]\n"," [6.9671392 ]\n"," [7.297272  ]\n"," [7.4396453 ]\n"," [7.336125  ]\n"," [7.133235  ]\n"," [7.637734  ]\n"," [7.517162  ]\n"," [6.9456115 ]\n"," [6.8466277 ]\n"," [6.304774  ]\n"," [0.04389785]\n"," [1.2097931 ]\n"," [0.04389785]\n"," [0.04389785]\n"," [0.04389785]\n"," [0.04389785]\n"," [0.04389785]\n"," [0.04389785]]\n","0.9356968967811874\n","0.7863637685824509\n","Now whole corpus\n"]},{"output_type":"display_data","data":{"text/plain":["Map:   0%|          | 0/23868 [00:00<?, ? 
examples/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"9a905030128747dda71e544a218f83c1"}},"metadata":{}},{"output_type":"stream","name":"stdout","text":["Now predicting\n"]},{"output_type":"display_data","data":{"text/plain":["<IPython.core.display.HTML object>"],"text/html":[]},"metadata":{}},{"output_type":"stream","name":"stdout","text":["[[4.7416587]\n"," [4.042534 ]\n"," [4.5959473]\n"," [3.6011248]\n"," [3.95696  ]\n"," [4.033051 ]\n"," [2.9295332]\n"," [3.0732918]\n"," [3.5146055]\n"," [3.4877264]\n"," [4.6582284]\n"," [4.264835 ]\n"," [4.3337755]\n"," [4.6021667]\n"," [3.7693517]\n"," [3.7339664]\n"," [2.9019458]\n"," [3.395866 ]\n"," [2.904875 ]\n"," [3.8887196]]\n","DF saved\n"]},{"output_type":"display_data","data":{"text/plain":["<IPython.core.display.HTML object>"],"text/html":["\n","    <div>\n","      \n","      <progress value='1492' max='1492' style='width:300px; height:20px; vertical-align: middle;'></progress>\n","      [1492/1492 01:31]\n","    </div>\n","    "]},"metadata":{}},{"output_type":"execute_result","data":{"text/plain":["{'eval_loss': 0.28258106112480164,\n"," 'eval_mse': 0.28258106112480164,\n"," 'eval_mae': 0.18581396341323853,\n"," 'eval_r2': 0.9196118178075527,\n"," 'eval_accuracy': 0.9366515837104072,\n"," 'eval_runtime': 91.8081,\n"," 'eval_samples_per_second': 259.977,\n"," 'eval_steps_per_second': 16.251,\n"," 'epoch': 20.0}"]},"metadata":{},"execution_count":3}]}]}